# Run core/get_encoding.py on data/道诡异仙.txt
# (presumably reports the file's text encoding -- confirm against the script).
# Declared phony: this is a command, not a file to build, so a stray file
# named "get-encoding" must not make the target look up to date.
.PHONY: get-encoding
get-encoding:
	python core/get_encoding.py data/道诡异仙.txt

# Run core/get_character_count.py on data/道诡异仙.txt
# (presumably counts the characters in the file -- confirm against the script).
# Declared phony so a file named "get-character-count" cannot shadow the command.
.PHONY: get-character-count
get-character-count:
	python core/get_character_count.py data/道诡异仙.txt

# Run core/conv_encoding.py on data/我的治愈系游戏.txt with
# "--out 我的治愈系游戏.txt --encoding utf-8".
# NOTE(review): the --out value has no data/ prefix, so if the script treats it
# as a path the result lands in the working directory, while the other targets
# read data/我的治愈系游戏.txt -- confirm this is intended.
# Declared phony so a file named "conv-encoding" cannot shadow the command.
.PHONY: conv-encoding
conv-encoding:
	python core/conv_encoding.py data/我的治愈系游戏.txt --out 我的治愈系游戏.txt --encoding utf-8

# Run core/split_regex.py on data/道诡异仙.txt with a chapter-heading pattern.
# The pattern is 第 (u7b2c), then one or more of the numerals
# 零一二三四五六七八九十百千, then 章 (u7ae0) -- e.g. "第一百二十三章".
# The shell collapses each doubled backslash inside the double quotes, so the
# script receives single-backslash uXXXX escapes (presumably compiled as a
# Python regular expression -- confirm against the script).
# The character class deliberately has no "|" separators: inside [...] a pipe
# is a literal character, not alternation, and would let "第|章" match.
# Declared phony so a file named "split-regex" cannot shadow the command.
.PHONY: split-regex
split-regex:
	python core/split_regex.py data/道诡异仙.txt --pattern "\\u7b2c[\\u96f6\\u4e00\\u4e8c\\u4e09\\u56db\\u4e94\\u516d\\u4e03\\u516b\\u4e5d\\u5341\\u767e\\u5343]+\\u7ae0"

# Run core/split_regex.py on data/我的治愈系游戏.txt with a chapter-heading
# pattern that uses digits: 第 (u7b2c), one or more digits, then 章 (u7ae0)
# -- e.g. "第12章".
# The shell collapses each doubled backslash inside the double quotes before
# the script sees the pattern.
# Declared phony so a file named "split-regex2" cannot shadow the command.
.PHONY: split-regex2
split-regex2:
	python core/split_regex.py data/我的治愈系游戏.txt --pattern "\\u7b2c\\d+\\u7ae0"

# Run novel.py on data/道诡异仙.txt with a pattern that captures a whole
# chapter-heading line: group 1 is 第 (u7b2c), one or more of the numerals
# 零一二三四五六七八九十百千, 章 (u7ae0), one or more non-word characters, and
# the rest of the line; the terminating newline sits outside the group.
# The shell collapses each doubled backslash inside the double quotes before
# the script sees the pattern.
# The character class deliberately has no "|" separators: inside [...] a pipe
# is a literal character, not alternation, and would let "第|章" match.
# Declared phony so a file named "extract-chapter" cannot shadow the command.
.PHONY: extract-chapter
extract-chapter:
	python novel.py data/道诡异仙.txt --pattern "(\\u7b2c[\\u96f6\\u4e00\\u4e8c\\u4e09\\u56db\\u4e94\\u516d\\u4e03\\u516b\\u4e5d\\u5341\\u767e\\u5343]+\\u7ae0\\W+[^\\n]+)\\n"

# Run novel.py on data/我的治愈系游戏.txt with a pattern that captures a whole
# chapter-heading line numbered with digits: group 1 is 第 (u7b2c), one or
# more digits, 章 (u7ae0), one or more non-word characters, and the rest of
# the line; the terminating newline sits outside the group.
# The shell collapses each doubled backslash inside the double quotes before
# the script sees the pattern.
# Declared phony so a file named "extract-chapter2" cannot shadow the command.
.PHONY: extract-chapter2
extract-chapter2:
	python novel.py data/我的治愈系游戏.txt --pattern "(\\u7b2c\\d+\\u7ae0\\W+[^\\n]+)\\n"
	